{
 "cells": [
  {
   "cell_type": "code",
   "id": "initial_id",
   "metadata": {
    "collapsed": true,
    "ExecuteTime": {
     "end_time": "2025-10-26T15:02:33.510283Z",
     "start_time": "2025-10-26T15:02:33.489779Z"
    }
   },
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Load the house sales dataset (path is relative to the kernel's working directory).\n",
    "# The `date` column holds ISO-formatted YYYY-MM-DD strings, so parse it to datetimes\n",
    "# at load time instead of leaving it as plain text that needs converting later.\n",
    "house_sales = pd.read_csv('../data/house_sales.csv', parse_dates=['date'])\n",
    "\n",
    "# Bare last expression -> rich HTML preview; pandas shows only the first and last rows.\n",
    "house_sales"
   ],
   "outputs": [
    {
     "data": {
      "text/plain": [
       "         id        date      price  bedrooms  bathrooms  sqft_living  \\\n",
       "0         1  2005-10-24  476315.91         8          4         1921   \n",
       "1         2  1937-07-18  698980.64         4          4         1503   \n",
       "2         3  2008-08-01  663024.75         3          3         3494   \n",
       "3         4  2011-08-31  629698.77         8          1         2618   \n",
       "4         5  2011-02-26  658139.54         1          2         1661   \n",
       "...     ...         ...        ...       ...        ...          ...   \n",
       "9995   9996  1953-07-11  303685.99         3          2         2378   \n",
       "9996   9997  2016-01-03  336882.94         2          1         4837   \n",
       "9997   9998  2021-11-12  423961.29         4          4         4750   \n",
       "9998   9999  1969-09-03  394782.02         6          5         4108   \n",
       "9999  10000  1999-11-20  738484.49         8          6         3533   \n",
       "\n",
       "      sqft_lot  floors  waterfront  view  condition  grade  sqft_above  \\\n",
       "0         1856       3           0     0          3      7        1864   \n",
       "1         6659       2           0     1          1      7        2177   \n",
       "2         3112       2           0     3          4     12        2030   \n",
       "3         8264       1           0     2          4      7        1576   \n",
       "4         3386       1           0     3          3      2         517   \n",
       "...        ...     ...         ...   ...        ...    ...         ...   \n",
       "9995      6259       1           0     4          4     13        2398   \n",
       "9996      6226       2           1     2          1      8        2198   \n",
       "9997      1641       2           1     1          2      1        2442   \n",
       "9998      7847       1           0     4          3      1        4226   \n",
       "9999      7641       3           0     0          3      2         937   \n",
       "\n",
       "      sqft_basement  yr_built  yr_renovated  zipcode        lat        long  \n",
       "0                87      1979          2010    98001  47.341860 -122.183176  \n",
       "1               100      1937             0    98010  47.532967 -122.026116  \n",
       "2              1084      1968          1989    98006  47.345444 -121.635418  \n",
       "3              1108      1911          1999    98010  47.749573 -121.794627  \n",
       "4               816      1900             0    98001  47.737984 -121.701806  \n",
       "...             ...       ...           ...      ...        ...         ...  \n",
       "9995            450      1927          1992    98010  47.394280 -121.689675  \n",
       "9996           1567      1986          2006    98003  47.530260 -122.444554  \n",
       "9997            380      2018             0    98004  47.020433 -122.275511  \n",
       "9998           1899      1912             0    98001  47.034089 -122.122351  \n",
       "9999            250      1979             0    98008  47.158349 -121.876240  \n",
       "\n",
       "[10000 rows x 19 columns]"
      ],
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>id</th>\n",
       "      <th>date</th>\n",
       "      <th>price</th>\n",
       "      <th>bedrooms</th>\n",
       "      <th>bathrooms</th>\n",
       "      <th>sqft_living</th>\n",
       "      <th>sqft_lot</th>\n",
       "      <th>floors</th>\n",
       "      <th>waterfront</th>\n",
       "      <th>view</th>\n",
       "      <th>condition</th>\n",
       "      <th>grade</th>\n",
       "      <th>sqft_above</th>\n",
       "      <th>sqft_basement</th>\n",
       "      <th>yr_built</th>\n",
       "      <th>yr_renovated</th>\n",
       "      <th>zipcode</th>\n",
       "      <th>lat</th>\n",
       "      <th>long</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>2005-10-24</td>\n",
       "      <td>476315.91</td>\n",
       "      <td>8</td>\n",
       "      <td>4</td>\n",
       "      <td>1921</td>\n",
       "      <td>1856</td>\n",
       "      <td>3</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>7</td>\n",
       "      <td>1864</td>\n",
       "      <td>87</td>\n",
       "      <td>1979</td>\n",
       "      <td>2010</td>\n",
       "      <td>98001</td>\n",
       "      <td>47.341860</td>\n",
       "      <td>-122.183176</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>1937-07-18</td>\n",
       "      <td>698980.64</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>1503</td>\n",
       "      <td>6659</td>\n",
       "      <td>2</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>7</td>\n",
       "      <td>2177</td>\n",
       "      <td>100</td>\n",
       "      <td>1937</td>\n",
       "      <td>0</td>\n",
       "      <td>98010</td>\n",
       "      <td>47.532967</td>\n",
       "      <td>-122.026116</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>2008-08-01</td>\n",
       "      <td>663024.75</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3494</td>\n",
       "      <td>3112</td>\n",
       "      <td>2</td>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>12</td>\n",
       "      <td>2030</td>\n",
       "      <td>1084</td>\n",
       "      <td>1968</td>\n",
       "      <td>1989</td>\n",
       "      <td>98006</td>\n",
       "      <td>47.345444</td>\n",
       "      <td>-121.635418</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>2011-08-31</td>\n",
       "      <td>629698.77</td>\n",
       "      <td>8</td>\n",
       "      <td>1</td>\n",
       "      <td>2618</td>\n",
       "      <td>8264</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>7</td>\n",
       "      <td>1576</td>\n",
       "      <td>1108</td>\n",
       "      <td>1911</td>\n",
       "      <td>1999</td>\n",
       "      <td>98010</td>\n",
       "      <td>47.749573</td>\n",
       "      <td>-121.794627</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>2011-02-26</td>\n",
       "      <td>658139.54</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>1661</td>\n",
       "      <td>3386</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>517</td>\n",
       "      <td>816</td>\n",
       "      <td>1900</td>\n",
       "      <td>0</td>\n",
       "      <td>98001</td>\n",
       "      <td>47.737984</td>\n",
       "      <td>-121.701806</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9995</th>\n",
       "      <td>9996</td>\n",
       "      <td>1953-07-11</td>\n",
       "      <td>303685.99</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>2378</td>\n",
       "      <td>6259</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>13</td>\n",
       "      <td>2398</td>\n",
       "      <td>450</td>\n",
       "      <td>1927</td>\n",
       "      <td>1992</td>\n",
       "      <td>98010</td>\n",
       "      <td>47.394280</td>\n",
       "      <td>-121.689675</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9996</th>\n",
       "      <td>9997</td>\n",
       "      <td>2016-01-03</td>\n",
       "      <td>336882.94</td>\n",
       "      <td>2</td>\n",
       "      <td>1</td>\n",
       "      <td>4837</td>\n",
       "      <td>6226</td>\n",
       "      <td>2</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>1</td>\n",
       "      <td>8</td>\n",
       "      <td>2198</td>\n",
       "      <td>1567</td>\n",
       "      <td>1986</td>\n",
       "      <td>2006</td>\n",
       "      <td>98003</td>\n",
       "      <td>47.530260</td>\n",
       "      <td>-122.444554</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9997</th>\n",
       "      <td>9998</td>\n",
       "      <td>2021-11-12</td>\n",
       "      <td>423961.29</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4750</td>\n",
       "      <td>1641</td>\n",
       "      <td>2</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>1</td>\n",
       "      <td>2442</td>\n",
       "      <td>380</td>\n",
       "      <td>2018</td>\n",
       "      <td>0</td>\n",
       "      <td>98004</td>\n",
       "      <td>47.020433</td>\n",
       "      <td>-122.275511</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9998</th>\n",
       "      <td>9999</td>\n",
       "      <td>1969-09-03</td>\n",
       "      <td>394782.02</td>\n",
       "      <td>6</td>\n",
       "      <td>5</td>\n",
       "      <td>4108</td>\n",
       "      <td>7847</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>4226</td>\n",
       "      <td>1899</td>\n",
       "      <td>1912</td>\n",
       "      <td>0</td>\n",
       "      <td>98001</td>\n",
       "      <td>47.034089</td>\n",
       "      <td>-122.122351</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9999</th>\n",
       "      <td>10000</td>\n",
       "      <td>1999-11-20</td>\n",
       "      <td>738484.49</td>\n",
       "      <td>8</td>\n",
       "      <td>6</td>\n",
       "      <td>3533</td>\n",
       "      <td>7641</td>\n",
       "      <td>3</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>937</td>\n",
       "      <td>250</td>\n",
       "      <td>1979</td>\n",
       "      <td>0</td>\n",
       "      <td>98008</td>\n",
       "      <td>47.158349</td>\n",
       "      <td>-121.876240</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>10000 rows × 19 columns</p>\n",
       "</div>"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "execution_count": 5
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 2
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython2",
   "version": "2.7.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
